1
|
3 |
|
import Token, { TokenType } from './Token' |
2
|
|
|
|
3
|
3 |
|
const OPERATORS = { |
4
|
|
|
'+': 'add', |
5
|
|
|
'-': 'sub', |
6
|
|
|
'*': 'mul', |
7
|
|
|
'/': 'div', |
8
|
|
|
'**': 'pow', |
9
|
|
|
'^': 'pow', |
10
|
|
|
'=': 'set', |
11
|
|
|
'==': 'equals', |
12
|
|
|
'<': 'isLessThan', |
13
|
|
|
'>': 'isGreaterThan', |
14
|
|
|
} |
15
|
|
|
|
16
|
|
|
/** |
17
|
|
|
* @class Lexer |
18
|
|
|
* @name Lexer |
19
|
|
|
*/ |
20
|
3 |
|
export class Lexer { |
21
|
|
|
s: string |
22
|
|
|
|
23
|
|
|
/** |
24
|
|
|
* Initialize a lexer. |
25
|
|
|
*/ |
26
|
|
|
constructor(input: string) { |
27
|
16 |
|
this.s = input |
28
|
|
|
} |
29
|
|
|
|
30
|
|
|
/** |
31
|
|
|
* Yields tokens as they are lexed. |
32
|
|
|
* |
33
|
|
|
*/ |
34
|
|
|
*lex(): Generator<Token> { |
35
|
14 |
|
let onSpace = false |
36
|
14 |
|
let onInteger = false |
37
|
14 |
|
let onWord = false |
38
|
14 |
|
let onOperator = false |
39
|
14 |
|
let buffer = '' |
40
|
|
|
|
41
|
|
|
// for each character |
42
|
14 |
|
for (let i = 0; i < this.s.length; i++) { |
43
|
59 |
|
const char = this.s[i] ?? '?' |
44
|
|
|
|
45
|
|
|
// if a space, combine with subsequent spaces into a separator |
46
|
59 |
|
if (/^\s$/.exec(char)) { |
47
|
12 |
|
if (onInteger) { |
48
|
4 |
|
yield new Token(TokenType.literal, buffer) |
49
|
4 |
|
onInteger = false |
50
|
4 |
|
buffer = '' |
51
|
8 |
|
} else if (onWord) { |
52
|
2 |
|
yield new Token(TokenType.identifier, buffer) |
53
|
2 |
|
onWord = false |
54
|
2 |
|
buffer = '' |
55
|
|
|
} |
56
|
12 |
|
onSpace = true |
57
|
12 |
|
buffer += char |
58
|
12 |
|
continue |
59
|
47 |
|
} else if (onSpace) { |
60
|
7 |
|
yield new Token(TokenType.separator, '') |
61
|
7 |
|
onSpace = false |
62
|
7 |
|
buffer = '' |
63
|
|
|
} |
64
|
|
|
|
65
|
|
|
// if a digit, combine with subsequent digits into a literal |
66
|
47 |
|
if (/^\d$/.exec(char)) { |
67
|
14 |
|
if (!onWord) { |
68
|
11 |
|
onInteger = true |
69
|
|
|
} |
70
|
14 |
|
buffer += char |
71
|
14 |
|
continue |
72
|
33 |
|
} else if (onInteger) { |
73
|
1 |
|
yield new Token(TokenType.literal, buffer) |
74
|
1 |
|
onInteger = false |
75
|
1 |
|
buffer = '' |
76
|
|
|
} |
77
|
|
|
|
78
|
|
|
// if a letter, combine with subsequent letters/numbers into an identifier |
79
|
33 |
|
if (/^[a-z]$/.exec(char) || (onWord && /^\d$/.exec(char))) { |
80
|
26 |
|
onWord = true |
81
|
26 |
|
buffer += char |
82
|
26 |
|
continue |
83
|
7 |
|
} else if (onWord) { |
84
|
1 |
|
yield new Token(TokenType.identifier, buffer) |
85
|
1 |
|
onWord = false |
86
|
1 |
|
buffer = '' |
87
|
|
|
} |
88
|
|
|
|
89
|
|
|
// if another char, combine with subsequent char and match an operator |
90
|
7 |
|
buffer += char |
91
|
7 |
|
if (buffer in OPERATORS) { |
92
|
3 |
|
yield new Token(TokenType.operator, buffer) |
93
|
3 |
|
onOperator = false |
94
|
3 |
|
buffer = '' |
95
|
3 |
|
continue |
96
|
|
|
} |
97
|
4 |
|
if (onOperator) { |
98
|
2 |
|
throw `Invalid operator "${buffer}"` |
99
|
|
|
} |
100
|
2 |
|
onOperator = true |
101
|
|
|
} |
102
|
|
|
|
103
|
12 |
|
if (onSpace) { |
104
|
3 |
|
yield new Token(TokenType.separator, '') |
105
|
|
|
} |
106
|
|
|
|
107
|
12 |
|
if (onInteger) { |
108
|
3 |
|
yield new Token(TokenType.literal, buffer) |
109
|
|
|
} |
110
|
|
|
|
111
|
12 |
|
if (onWord) { |
112
|
6 |
|
yield new Token(TokenType.identifier, buffer) |
113
|
|
|
} |
114
|
|
|
} |
115
|
|
|
} |
116
|
|
|
|
117
|
|
|
export default Lexer |
118
|
|
|
|